package com.terren.spider.util.common;

/**
 * Static helpers for cleaning up HTML text.
 */
public class HtmlUtil {
	/**
	 * Matches a single piece of markup, in this order of alternatives:
	 * <ul>
	 * <li>a comment {@code <!-- ... -->} (may contain {@code >} and line breaks),</li>
	 * <li>an opening, closing or self-closing tag whose name starts with a letter,</li>
	 * <li>a declaration such as {@code <!DOCTYPE html>}.</li>
	 * </ul>
	 * Each alternative stops at the first terminator, so text between two tags is
	 * never part of a match. A {@code <} that is not followed by a letter,
	 * {@code /} + letter, or {@code !} (for example in {@code "1 < 2"}) is not
	 * treated as markup.
	 */
	private static final java.util.regex.Pattern TAG_PATTERN = java.util.regex.Pattern.compile(
			"<!--.*?-->|</?[A-Za-z][^>]*>|<![^>]*>",
			java.util.regex.Pattern.DOTALL);

	/**
	 * Removes HTML tags, comments and declarations from the given text while
	 * keeping the text that appears between them.
	 * <p>
	 * Only the markup itself is removed; the text content of every element
	 * (including {@code script} and {@code style}) is left in place, and
	 * character entities such as {@code &amp;} are not decoded.
	 *
	 * @param htmlContent the HTML text to clean; may be {@code null}
	 * @return the text with all markup removed, or {@code null} if
	 *         {@code htmlContent} is {@code null}
	 */
	public static String removeTag(String htmlContent) {
		// Nothing to strip; hand null back instead of failing with a NullPointerException.
		if (htmlContent == null) {
			return null;
		}
		// Strip the markup. The pattern is compiled once and matches tags
		// individually, so "<p>a</p>" yields "a" rather than an empty string.
		return TAG_PATTERN.matcher(htmlContent).replaceAll("");
	}
}
